# Spark master URL; handed to enc_semap.py as its last argument.
MASTER_URL := spark://kurgan:7077

# Launcher command used to run enc_semap.py.
PYSPARK := pyspark

# Input text file (first argument to enc_semap.py).
text_file := data.txt

# Vocabulary and encoded-data files: passed to enc_semap.py and removed by
# `clean`. Presumably these are the script's outputs -- confirm in enc_semap.py.
vocab_file := vocab.txt
enc_file_learn := encdata_learn.txt
enc_file_class := encdata_class.txt

# Second argument to enc_semap.py; its exact meaning is defined by the script.
n := 150

# Cap on the number of sentences processed; runs become slow beyond 200k.
m := 200000

# Run the enc_semap.py job through $(PYSPARK) with the settings defined above.
# `all` names an action rather than a file, so it is declared phony: without
# this, a file or directory called `all` would make the job appear up to date
# and it would never run.
.PHONY: all
all:
	$(PYSPARK) ./enc_semap.py \
		$(text_file) $(n) $(m) \
		$(vocab_file) $(enc_file_learn) $(enc_file_class) \
		$(MASTER_URL)

# Remove the vocabulary and encoded-data files plus any nohup.out left behind.
# Declared phony so that a stray file named `clean` cannot disable this target.
# `rm -f` keeps the target successful when some of the files do not exist.
.PHONY: clean
clean:
	rm -f $(vocab_file) $(enc_file_learn) $(enc_file_class) nohup.out


